#include <stdio.h>

/*
 * Hello-world kernel: every launched thread prints one line containing
 * its block index and its thread index within the block.
 *
 * Only the x component of blockIdx/threadIdx is reported.
 * Device-side printf is intended for debugging/demo purposes.
 */
__global__ void cuda_hello()
{
	const unsigned int block_id = blockIdx.x;
	const unsigned int thread_id = threadIdx.x;

	printf("[GPU] block=%d, thread=%d\n", block_id, thread_id);
}

/*
 * Host entry point.
 *
 * Launches cuda_hello with 3 blocks of 3 threads, prints a host message
 * before and after waiting for the device, and reports any CUDA error.
 *
 * Returns 0 on success, 1 if the kernel launch or the synchronization
 * reported a CUDA error (the error string is written to stderr).
 */
int main() {
	// Kernel launches are asynchronous with respect to the host: control
	// returns here without waiting for the kernel to finish.
	cuda_hello<<<3, 3>>>();

	// A launch has no return value; launch-time failures (bad configuration,
	// no usable device, ...) must be fetched explicitly.
	cudaError_t err = cudaGetLastError();
	if (err != cudaSuccess) {
		fprintf(stderr, "[Host] kernel launch failed: %s\n", cudaGetErrorString(err));
		return 1;
	}

	printf("[Host] hello world before sync\n");

	// Block until the kernel has completed; errors raised while the kernel
	// was executing are reported by this call.
	err = cudaDeviceSynchronize();
	if (err != cudaSuccess) {
		fprintf(stderr, "[Host] cudaDeviceSynchronize failed: %s\n", cudaGetErrorString(err));
		return 1;
	}

	printf("[Host] hello world after sync\n");
	return 0;
}
